% Cotter et al., Journal of Machine Learning Research 20(172), 2019.
% Authors are written in "Last, First" form, and the page range uses the
% double-hyphen form so styles typeset it as an en dash.
@article{cotter2019JMLR,
  author  = {Cotter, Andrew and Jiang, Heinrich and Gupta, Maya and Wang, Serena and Narayan, Taman and You, Seungil and Sridharan, Karthik},
  title   = {{Optimization with Non-Differentiable Constraints with Applications to Fairness, Recall, Churn, and Other Goals}},
  journal = {Journal of Machine Learning Research},
  year    = {2019},
  volume  = {20},
  number  = {172},
  pages   = {1--59},
  url     = {http://jmlr.org/papers/v20/18-616.html}
}
% Boyd and Vandenberghe, "Convex Optimization" (book, 2004).
% The url field links to a PDF hosted on web.stanford.edu.
@book{boyd2004convex,
  author    = {Boyd, Stephen and Vandenberghe, Lieven},
  title     = {{Convex Optimization}},
  publisher = {Cambridge University Press},
  year      = {2004},
  url       = {https://web.stanford.edu/~boyd/cvxbook/bv_cvxbook.pdf},
}
% von Neumann, "Zur Theorie der Gesellschaftsspiele", Mathematische Annalen
% 100(1), 1928. The title stays fully braced so the capitalised German nouns
% are not lowercased by sentence-casing styles.
@article{vonNeumann1928theorie,
  author    = {von Neumann, John},
  title     = {{Zur Theorie der Gesellschaftsspiele}},
  journal   = {{Mathematische Annalen}},
  publisher = {Springer},
  year      = {1928},
  volume    = {100},
  number    = {1},
  pages     = {295--320},
  url       = {https://cs.uwaterloo.ca/~y328yu/classics/vonNeumann.pdf},
}
% Narasimhan et al., NeurIPS 2020.
% "Lagrange" is braced so that styles which sentence-case titles keep the
% proper noun capitalised.
@inproceedings{narasimhan2020multiplier,
  author    = {Narasimhan, Harikrishna and Cotter, Andrew and Zhou, Yichen and Wang, Serena and Guo, Wenshuo},
  title     = {Approximate Heavily-Constrained Learning with {Lagrange} Multiplier Models},
  booktitle = {NeurIPS},
  year      = {2020},
  url       = {https://proceedings.neurips.cc/paper/2020/hash/62db9e3397c76207a687c360e0243317-Abstract.html}
}
% Korpelevich, "The extragradient method for finding saddle points and other
% problems", Matecon, 1976.
% NOTE(review): volume and pages are the values commonly given when this paper
% is cited; confirm against the journal issue before relying on them.
@article{korpelevich1976extragradient,
  title   = {{The extragradient method for finding saddle points and other problems}},
  author  = {Korpelevich, Galina M.},
  journal = {Matecon},
  volume  = {12},
  pages   = {747--756},
  year    = {1976},
  url     = {https://cs.uwaterloo.ca/~y328yu/classics/extragrad.pdf}
}
% Gidel et al., ICLR 2019.
% NOTE(review): the citation key says 2018 while the year field is 2019; the
% key is left unchanged because citing documents refer to it.
@inproceedings{gidel2018variational,
  author    = {Gidel, Gauthier and Berard, Hugo and Vignoud, Ga{\"e}tan and Vincent, Pascal and Lacoste-Julien, Simon},
  title     = {{A Variational Inequality Perspective on Generative Adversarial Networks}},
  year      = {2019},
  booktitle = {{ICLR}},
  url       = {https://openreview.net/forum?id=r1laEnA5Ym},
}
% Lin, Jin and Jordan, ICML 2020; the url is on proceedings.mlr.press (v119).
@inproceedings{lin2020gradient,
  author    = {Lin, Tianyi and Jin, Chi and Jordan, Michael},
  title     = {{On Gradient Descent Ascent for Nonconvex-Concave Minimax Problems}},
  year      = {2020},
  booktitle = {{ICML}},
  url       = {https://proceedings.mlr.press/v119/lin20a.html},
}

% Sutskever et al., ICML 2013; the url is on proceedings.mlr.press (v28).
@inproceedings{sutskever2013initialization,
  author    = {Sutskever, Ilya and Martens, James and Dahl, George and Hinton, Geoffrey},
  title     = {On the importance of initialization and momentum in deep learning},
  year      = {2013},
  booktitle = {{ICML}},
  url       = {https://proceedings.mlr.press/v28/sutskever13.html},
}
% Reddi, Kale and Kumar, ICLR 2018.
% "Adam" is braced so that sentence-casing styles keep the optimizer name
% capitalised.
% NOTE(review): the forum id in url is believed to be this paper's OpenReview
% page; confirm that it resolves to the right title.
@inproceedings{reddi2018amsgrad,
  title     = {On the Convergence of {Adam} and Beyond},
  author    = {Reddi, Sashank J. and Kale, Satyen and Kumar, Sanjiv},
  booktitle = {{ICLR}},
  year      = {2018},
  url       = {https://openreview.net/forum?id=ryQu7f-RZ}
}
